#ifndef __FLY_CUDA_REDUCE_H__
#define __FLY_CUDA_REDUCE_H__

#include "perf.h"

#include <stddef.h>

// Declaration only: g_reduceBlockSize is a constant of type size_t that is
// defined in another translation unit; its value is not visible in this header.
// NOTE(review): the name suggests the block size used by the reduction, and
// cuda_reduce_sum_double() also takes an explicit block_size argument --
// confirm against the definition how (or whether) the two are related.
extern const size_t g_reduceBlockSize;

extern "C" {

/*
 * Entry point for the double-precision sum reduction, exported with C linkage
 * (unmangled symbol name). Only the prototype lives in this header; the
 * implementation is in another translation unit.
 *
 * Parameters:
 *   input       pointer to const double; not modifiable through this pointer.
 *   output      pointer to double that the callee may write through.
 *   size        int; presumably the number of elements in `input` -- TODO confirm.
 *   grid_size   int; presumably the number of blocks to launch -- TODO confirm.
 *   block_size  int; presumably the number of threads per block -- TODO confirm.
 *
 * Returns nothing; no status or error code is reported through this interface.
 *
 * NOTE(review): this header does not show whether `input` / `output` must be
 * device or host pointers, how many values are written to `output`, or
 * whether the call synchronizes before returning. Verify against the
 * definition before relying on any of these.
 */
void cuda_reduce_sum_double(
    const double* input,
    double* output,
    int size,
    int grid_size,
    int block_size);

}  // extern "C"


#endif // __FLY_CUDA_REDUCE_H__